from datasets import load_dataset


# Hub repository and configuration name passed to load_dataset.
DATASET_REPO = "liwu/MNBVC"
DATASET_CONFIG = "news_peoples_daily"
# Directory the loaded dataset is saved to.
OUTPUT_DIR = "data/mnbvc/peoples_daily"
# Number of worker processes requested from load_dataset.
NUM_PROC = 8


def main():
    """Load the configured dataset, save it to disk, and print a preview.

    Prints the loaded dataset object followed by the first record of its
    "train" split.
    """
    dataset = load_dataset(
        DATASET_REPO,
        DATASET_CONFIG,
        num_proc=NUM_PROC,
        # NOTE(review): this flag opts in to running loading code shipped with
        # the dataset repository; confirm the repository is trusted.
        trust_remote_code=True,
    )
    dataset.save_to_disk(OUTPUT_DIR)
    print(dataset)
    print(dataset["train"][0])


# Worker processes are requested above. Where processes are started with
# "spawn" (e.g. Windows, macOS), each worker re-imports the main module, so
# the work must sit behind this guard to avoid re-running inside workers.
if __name__ == "__main__":
    main()
